# Translation catalog for the PaddleNLP documentation page paddlenlp.transformers.xlnet.tokenizer.
# Copyright (C) 2021, PaddleNLP
# This file is distributed under the same license as the PaddleNLP package.
# FIRST AUTHOR <EMAIL@ADDRESS>, 2022.
#
#, fuzzy
msgid ""
msgstr ""
"Project-Id-Version: PaddleNLP \n"
"Report-Msgid-Bugs-To: \n"
"POT-Creation-Date: 2022-03-18 21:31+0800\n"
"PO-Revision-Date: YEAR-MO-DA HO:MI+ZONE\n"
"Last-Translator: FULL NAME <EMAIL@ADDRESS>\n"
"Language-Team: LANGUAGE <LL@li.org>\n"
"MIME-Version: 1.0\n"
"Content-Type: text/plain; charset=utf-8\n"
"Content-Transfer-Encoding: 8bit\n"
"Generated-By: Babel 2.9.0\n"

#: ../source/paddlenlp.transformers.xlnet.tokenizer.rst:2
msgid "tokenizer"
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer:1
msgid "Tokenization class for XLNet model."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:1
msgid "基类：:class:`paddlenlp.transformers.tokenizer_utils.PretrainedTokenizer`"
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:1
msgid ""
"Constructs an XLNet tokenizer based on `SentencePiece "
"<https://github.com/google/sentencepiece>`__."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:3
msgid ""
"This tokenizer inherits from "
":class:`~paddlenlp.transformers.tokenizer_utils.PretrainedTokenizer` "
"which contains most of the main methods. For more information regarding "
"those methods, please refer to this superclass."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.convert_tokens_to_string
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.num_special_tokens_to_add
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.save_resources
msgid "参数"
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:7
msgid ""
"The vocabulary file (ends with '.spm') required to instantiate a "
"`SentencePiece <https://github.com/google/sentencepiece>`__ tokenizer."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:10
msgid ""
"Whether or not to lowercase the input when tokenizing. Defaults to "
"`False` and **does not** lowercase the input."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:13
msgid ""
"Whether or not to strip the text when tokenizing. Defaults to `True` and "
"removes excess spaces before and after the string."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:16
msgid ""
"Whether or not to keep accents when tokenizing. Defaults to `False` and "
"**does not** keep accents."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:18
msgid ""
"A special token representing the beginning of a sequence that was used "
"during pretraining. Defaults to `\"<s>\"`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:21
msgid ""
"A special token representing the end of a sequence that was used during "
"pretraining. Defaults to `\"</s>\"`."
msgstr ""

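# NOTE: "inorder" in the msgid below is a typo for "in order" in the source
# docstring. The msgid is kept verbatim so that it still matches the source.
#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:24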
msgid ""
"A special token representing the *unknown (out-of-vocabulary)* token. An "
"unknown token is set to be `unk_token` inorder to be converted to an ID. "
"Defaults to `\"<unk>\"`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:28
msgid ""
"A special token separating two different sentences in the same input. "
"Defaults to `\"<sep>\"`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:31
msgid ""
"A special token used to make arrays of tokens the same size for batching "
"purposes. Defaults to `\"<pad>\"`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:34
msgid ""
"A special token used for sequence classification. It is the last token of"
" the sequence when built with special tokens. Defaults to `\"<cls>\"`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:37
msgid ""
"A special token representing a masked token. This is the token used in "
"the masked language modeling task which the model tries to predict the "
"original unmasked ones. Defaults to `\"<mask>\"`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:41
msgid ""
"A list of additional special tokens to be used by the tokenizer. Defaults"
" to `[\"<eop>\", \"<eod>\"]`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:47
msgid ""
"The *SentencePiece* processor that is used for every conversion (string, "
"tokens and IDs)."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer
msgid "type"
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer:49
msgid "SentencePieceProcessor"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.convert_tokens_to_string:1
msgid ""
"Converts a sequence of tokens (list of string) to a single string by "
"using ``' '.join(tokens)`` ."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.convert_tokens_to_string:4
msgid "A sequence of tokens."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.convert_tokens_to_string
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.num_special_tokens_to_add
msgid "返回"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.convert_tokens_to_string:7
msgid "Converted string."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.convert_tokens_to_string
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.num_special_tokens_to_add
msgid "返回类型"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.num_special_tokens_to_add:1
msgid ""
"Returns the number of added tokens when encoding a sequence with special "
"tokens."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.num_special_tokens_to_add:3
msgid ""
"Whether the input is a sequence pair or a single sequence. Defaults to "
"`False` and the input is a single sequence."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.num_special_tokens_to_add:7
msgid "Number of tokens added to sequences."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens:1
msgid ""
"Builds model inputs from a sequence or a pair of sequence for sequence "
"classification tasks by concatenating and adding special tokens. An XLNet"
" sequence has the following format:"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens:5
msgid "single sequence:      ``X <sep> <cls>``"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens:6
msgid "pair of sequences:    ``A <sep> B <sep> <cls>``"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens:8
msgid "List of IDs for the first sequence."
msgstr ""

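# NOTE: "sequenze" in the msgid below is a typo for "sequence" in the source
# docstring. The msgid is kept verbatim so that it still matches the source.
#: of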
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens:10
msgid "Optional second list of IDs for the second sequenze. Defaults to `None`."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_inputs_with_special_tokens:13
msgid "List of input IDs with the appropriate special tokens."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:1
msgid ""
"Builds offset map from a pair of offset map by concatenating and adding "
"offsets of special tokens."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:4
msgid "An XLNet offset_mapping has the following format:"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:6
msgid "single sequence:      ``X (0,0) (0,0)``"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:7
msgid "pair of sequences:    ``A (0,0) B (0,0) (0,0)``"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:9
msgid "List of char offsets to which the special tokens will be added."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:11
msgid ""
"Optional second list of char offsets for offset mapping pairs. Defaults "
"to `None`."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.build_offset_mapping_with_special_tokens:15
msgid "A list of char offsets with the appropriate offsets of special tokens."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask:1
msgid ""
"Creates a special tokens mask from the input sequences. This method is "
"called when adding special tokens using the tokenizer `encode` method."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:22
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask:4
msgid "A list of `inputs_ids` for the first sequence."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:24
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask:6
msgid ""
"Optional second list of `inputs_ids` for the second sequence. Defaults to"
" `None`."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask:9
msgid ""
"Whether or not the token list already contains special tokens for the "
"model. Defaults to `False`."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.get_special_tokens_mask:13
msgid ""
"A list of integers which is either 0 or 1: 1 for a special token, 0 for a"
" sequence token."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:1
msgid ""
"Creates a token_type mask from the input sequences. If `token_ids_1` is "
"not `None`, then a sequence pair token_type mask has the following "
"format:"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:10
msgid ""
"Else if `token_ids_1` is `None`, then a single sequence token_type mask "
"has the following format:"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:18
msgid "0 stands for the segment id of **first segment tokens**,"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:19
msgid "1 stands for the segment id of **second segment tokens**,"
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:20
msgid "2 stands for the segment id of **cls_token**."
msgstr ""

#: of
#: paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.create_token_type_ids_from_sequences:28
msgid "List of token type IDs according to the given sequence(s)."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.save_resources:1
msgid ""
"Saves `SentencePiece <https://github.com/google/sentencepiece>`__ file "
"(ends with '.spm') under `save_directory`."
msgstr ""

#: of paddlenlp.transformers.xlnet.tokenizer.XLNetTokenizer.save_resources:4
msgid "Directory to save files into."
msgstr ""

